1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19 package org.apache.hadoop.hbase;
20
21 import java.io.Serializable;
22 import java.util.Comparator;
23
24 import org.apache.hadoop.hbase.KeyValue.Type;
25 import org.apache.hadoop.hbase.classification.InterfaceAudience;
26 import org.apache.hadoop.hbase.classification.InterfaceStability;
27 import org.apache.hadoop.hbase.util.Bytes;
28
29 import com.google.common.primitives.Longs;
30
31
32
33
34
35
36
37
38 @edu.umd.cs.findbugs.annotations.SuppressWarnings(
39 value="UNKNOWN",
40 justification="Findbugs doesn't like the way we are negating the result of a compare in below")
41 @InterfaceAudience.Private
42 @InterfaceStability.Evolving
43 public class CellComparator implements Comparator<Cell>, Serializable {
44 private static final long serialVersionUID = -8760041766259623329L;
45
46 @Override
47 public int compare(Cell a, Cell b) {
48 return compare(a, b, false);
49 }
50
51
52
53
54
55
56
57
58
59
60
61 public static int compare(final Cell a, final Cell b, boolean ignoreSequenceid) {
62
63 int c = compareRows(a, b);
64 if (c != 0) return c;
65
66 c = compareWithoutRow(a, b);
67 if(c != 0) return c;
68
69 if (!ignoreSequenceid) {
70
71
72 return Longs.compare(b.getMvccVersion(), a.getMvccVersion());
73 } else {
74 return c;
75 }
76 }
77
78 public static int findCommonPrefixInRowPart(Cell left, Cell right, int rowCommonPrefix) {
79 return findCommonPrefix(left.getRowArray(), right.getRowArray(), left.getRowLength()
80 - rowCommonPrefix, right.getRowLength() - rowCommonPrefix, left.getRowOffset()
81 + rowCommonPrefix, right.getRowOffset() + rowCommonPrefix);
82 }
83
84 private static int findCommonPrefix(byte[] left, byte[] right, int leftLength, int rightLength,
85 int leftOffset, int rightOffset) {
86 int length = Math.min(leftLength, rightLength);
87 int result = 0;
88
89 while (result < length && left[leftOffset + result] == right[rightOffset + result]) {
90 result++;
91 }
92 return result;
93 }
94
95 public static int findCommonPrefixInFamilyPart(Cell left, Cell right, int familyCommonPrefix) {
96 return findCommonPrefix(left.getFamilyArray(), right.getFamilyArray(), left.getFamilyLength()
97 - familyCommonPrefix, right.getFamilyLength() - familyCommonPrefix, left.getFamilyOffset()
98 + familyCommonPrefix, right.getFamilyOffset() + familyCommonPrefix);
99 }
100
101 public static int findCommonPrefixInQualifierPart(Cell left, Cell right,
102 int qualifierCommonPrefix) {
103 return findCommonPrefix(left.getQualifierArray(), right.getQualifierArray(),
104 left.getQualifierLength() - qualifierCommonPrefix, right.getQualifierLength()
105 - qualifierCommonPrefix, left.getQualifierOffset() + qualifierCommonPrefix,
106 right.getQualifierOffset() + qualifierCommonPrefix);
107 }
108
109
110
111 public static boolean equals(Cell a, Cell b){
112 return equalsRow(a, b)
113 && equalsFamily(a, b)
114 && equalsQualifier(a, b)
115 && equalsTimestamp(a, b)
116 && equalsType(a, b);
117 }
118
119 public static boolean equalsRow(Cell a, Cell b){
120 return Bytes.equals(
121 a.getRowArray(), a.getRowOffset(), a.getRowLength(),
122 b.getRowArray(), b.getRowOffset(), b.getRowLength());
123 }
124
125 public static boolean equalsFamily(Cell a, Cell b){
126 return Bytes.equals(
127 a.getFamilyArray(), a.getFamilyOffset(), a.getFamilyLength(),
128 b.getFamilyArray(), b.getFamilyOffset(), b.getFamilyLength());
129 }
130
131 public static boolean equalsQualifier(Cell a, Cell b){
132 return Bytes.equals(
133 a.getQualifierArray(), a.getQualifierOffset(), a.getQualifierLength(),
134 b.getQualifierArray(), b.getQualifierOffset(), b.getQualifierLength());
135 }
136
137 public static boolean equalsTimestamp(Cell a, Cell b){
138 return a.getTimestamp() == b.getTimestamp();
139 }
140
141 public static boolean equalsType(Cell a, Cell b){
142 return a.getTypeByte() == b.getTypeByte();
143 }
144
145 public static int compareColumns(final Cell left, final Cell right) {
146 int lfoffset = left.getFamilyOffset();
147 int rfoffset = right.getFamilyOffset();
148 int lclength = left.getQualifierLength();
149 int rclength = right.getQualifierLength();
150 int lfamilylength = left.getFamilyLength();
151 int rfamilylength = right.getFamilyLength();
152 int diff = compare(left.getFamilyArray(), lfoffset, lfamilylength, right.getFamilyArray(),
153 rfoffset, rfamilylength);
154 if (diff != 0) {
155 return diff;
156 } else {
157 return compare(left.getQualifierArray(), left.getQualifierOffset(), lclength,
158 right.getQualifierArray(), right.getQualifierOffset(), rclength);
159 }
160 }
161
162 public static int compareFamilies(Cell left, Cell right) {
163 return Bytes.compareTo(left.getFamilyArray(), left.getFamilyOffset(), left.getFamilyLength(),
164 right.getFamilyArray(), right.getFamilyOffset(), right.getFamilyLength());
165 }
166
167 public static int compareQualifiers(Cell left, Cell right) {
168 return Bytes.compareTo(left.getQualifierArray(), left.getQualifierOffset(),
169 left.getQualifierLength(), right.getQualifierArray(), right.getQualifierOffset(),
170 right.getQualifierLength());
171 }
172
173 public int compareFlatKey(Cell left, Cell right) {
174 int compare = compareRows(left, right);
175 if (compare != 0) {
176 return compare;
177 }
178 return compareWithoutRow(left, right);
179 }
180
181
182
183
184
185 public static int compareRows(final Cell left, final Cell right) {
186 return Bytes.compareTo(left.getRowArray(), left.getRowOffset(), left.getRowLength(),
187 right.getRowArray(), right.getRowOffset(), right.getRowLength());
188 }
189
190
191
192
193
194 public static int compareRows(byte[] left, int loffset, int llength, byte[] right, int roffset,
195 int rlength) {
196 return Bytes.compareTo(left, loffset, llength, right, roffset, rlength);
197 }
198
199 public static int compareWithoutRow(final Cell leftCell, final Cell rightCell) {
200
201
202
203
204
205
206
207 if (leftCell.getFamilyLength() + leftCell.getQualifierLength() == 0
208 && leftCell.getTypeByte() == Type.Minimum.getCode()) {
209
210 return 1;
211 }
212 if (rightCell.getFamilyLength() + rightCell.getQualifierLength() == 0
213 && rightCell.getTypeByte() == Type.Minimum.getCode()) {
214 return -1;
215 }
216 boolean sameFamilySize = (leftCell.getFamilyLength() == rightCell.getFamilyLength());
217 if (!sameFamilySize) {
218
219
220 return Bytes.compareTo(leftCell.getFamilyArray(), leftCell.getFamilyOffset(),
221 leftCell.getFamilyLength(), rightCell.getFamilyArray(), rightCell.getFamilyOffset(),
222 rightCell.getFamilyLength());
223 }
224 int diff = compareColumns(leftCell, rightCell);
225 if (diff != 0) return diff;
226
227 diff = compareTimestamps(leftCell, rightCell);
228 if (diff != 0) return diff;
229
230
231
232
233
234 return (0xff & rightCell.getTypeByte()) - (0xff & leftCell.getTypeByte());
235 }
236
237 public static int compareTimestamps(final Cell left, final Cell right) {
238 long ltimestamp = left.getTimestamp();
239 long rtimestamp = right.getTimestamp();
240 return compareTimestamps(ltimestamp, rtimestamp);
241 }
242
243
244
245
246
247
248
249 public static int hashCode(Cell cell){
250 if (cell == null) {
251 return 0;
252 }
253
254 int hash = calculateHashForKeyValue(cell);
255 hash = 31 * hash + (int)cell.getMvccVersion();
256 return hash;
257 }
258
259
260
261
262
263
264
265
266
267 public static int hashCodeIgnoreMvcc(Cell cell) {
268 if (cell == null) {
269 return 0;
270 }
271
272 int hash = calculateHashForKeyValue(cell);
273 return hash;
274 }
275
276 private static int calculateHashForKeyValue(Cell cell) {
277
278 int rowHash = Bytes.hashCode(cell.getRowArray(), cell.getRowOffset(), cell.getRowLength());
279 int familyHash =
280 Bytes.hashCode(cell.getFamilyArray(), cell.getFamilyOffset(), cell.getFamilyLength());
281 int qualifierHash = Bytes.hashCode(cell.getQualifierArray(), cell.getQualifierOffset(),
282 cell.getQualifierLength());
283
284
285 int hash = 31 * rowHash + familyHash;
286 hash = 31 * hash + qualifierHash;
287 hash = 31 * hash + (int)cell.getTimestamp();
288 hash = 31 * hash + cell.getTypeByte();
289 return hash;
290 }
291
292
293
294
295 public static boolean areKeyLengthsEqual(Cell a, Cell b) {
296 return a.getRowLength() == b.getRowLength()
297 && a.getFamilyLength() == b.getFamilyLength()
298 && a.getQualifierLength() == b.getQualifierLength();
299 }
300
301 public static boolean areRowLengthsEqual(Cell a, Cell b) {
302 return a.getRowLength() == b.getRowLength();
303 }
304
305
306
307
308 private static int compare(byte[] left, int leftOffset, int leftLength, byte[] right,
309 int rightOffset, int rightLength) {
310 return Bytes.compareTo(left, leftOffset, leftLength, right, rightOffset, rightLength);
311 }
312
313 public static int compareCommonRowPrefix(Cell left, Cell right, int rowCommonPrefix) {
314 return compare(left.getRowArray(), left.getRowOffset() + rowCommonPrefix, left.getRowLength()
315 - rowCommonPrefix, right.getRowArray(), right.getRowOffset() + rowCommonPrefix,
316 right.getRowLength() - rowCommonPrefix);
317 }
318
319 public static int compareCommonFamilyPrefix(Cell left, Cell right,
320 int familyCommonPrefix) {
321 return compare(left.getFamilyArray(), left.getFamilyOffset() + familyCommonPrefix,
322 left.getFamilyLength() - familyCommonPrefix, right.getFamilyArray(),
323 right.getFamilyOffset() + familyCommonPrefix,
324 right.getFamilyLength() - familyCommonPrefix);
325 }
326
327 public static int compareCommonQualifierPrefix(Cell left, Cell right,
328 int qualCommonPrefix) {
329 return compare(left.getQualifierArray(), left.getQualifierOffset() + qualCommonPrefix,
330 left.getQualifierLength() - qualCommonPrefix, right.getQualifierArray(),
331 right.getQualifierOffset() + qualCommonPrefix, right.getQualifierLength()
332 - qualCommonPrefix);
333 }
334
335
336
337
338
339 public static boolean equalsIgnoreMvccVersion(Cell a, Cell b){
340 return 0 == compareStaticIgnoreMvccVersion(a, b);
341 }
342
343 private static int compareStaticIgnoreMvccVersion(Cell a, Cell b) {
344
345 int c = compareRows(a, b);
346 if (c != 0) return c;
347
348
349 c = compareColumns(a, b);
350 if (c != 0) return c;
351
352
353 c = compareTimestamps(a, b);
354 if (c != 0) return c;
355
356
357 c = (0xff & b.getTypeByte()) - (0xff & a.getTypeByte());
358 return c;
359 }
360
361 private static int compareTimestamps(final long ltimestamp, final long rtimestamp) {
362
363
364
365
366 if (ltimestamp < rtimestamp) {
367 return 1;
368 } else if (ltimestamp > rtimestamp) {
369 return -1;
370 }
371 return 0;
372 }
373
374
375
376
377 public static class RowComparator extends CellComparator {
378 @Override
379 public int compare(Cell a, Cell b) {
380 return compareRows(a, b);
381 }
382 }
383
384
385
386
387
388
389
390
391
392
393
394 public static Cell getMidpoint(final KeyValue.KVComparator comparator, final Cell left,
395 final Cell right) {
396
397
398 if (right == null) {
399 throw new IllegalArgumentException("right cell can not be null");
400 }
401 if (left == null) {
402 return right;
403 }
404
405
406
407 if (comparator != null && comparator instanceof KeyValue.MetaComparator) {
408 return right;
409 }
410 int diff = compareRows(left, right);
411 if (diff > 0) {
412 throw new IllegalArgumentException("Left row sorts after right row; left=" +
413 CellUtil.getCellKeyAsString(left) + ", right=" + CellUtil.getCellKeyAsString(right));
414 }
415 if (diff < 0) {
416
417 byte [] midRow = getMinimumMidpointArray(left.getRowArray(), left.getRowOffset(),
418 left.getRowLength(),
419 right.getRowArray(), right.getRowOffset(), right.getRowLength());
420
421 if (midRow == null) return right;
422 return CellUtil.createCell(midRow);
423 }
424
425 diff = compareFamilies(left, right);
426 if (diff > 0) {
427 throw new IllegalArgumentException("Left family sorts after right family; left=" +
428 CellUtil.getCellKeyAsString(left) + ", right=" + CellUtil.getCellKeyAsString(right));
429 }
430 if (diff < 0) {
431 byte [] midRow = getMinimumMidpointArray(left.getFamilyArray(), left.getFamilyOffset(),
432 left.getFamilyLength(),
433 right.getFamilyArray(), right.getFamilyOffset(), right.getFamilyLength());
434
435 if (midRow == null) return right;
436
437 return CellUtil.createCell(right.getRowArray(), right.getRowOffset(), right.getRowLength(),
438 midRow, 0, midRow.length, HConstants.EMPTY_BYTE_ARRAY, 0,
439 HConstants.EMPTY_BYTE_ARRAY.length);
440 }
441
442 diff = compareQualifiers(left, right);
443 if (diff > 0) {
444 throw new IllegalArgumentException("Left qualifier sorts after right qualifier; left=" +
445 CellUtil.getCellKeyAsString(left) + ", right=" + CellUtil.getCellKeyAsString(right));
446 }
447 if (diff < 0) {
448 byte [] midRow = getMinimumMidpointArray(left.getQualifierArray(), left.getQualifierOffset(),
449 left.getQualifierLength(),
450 right.getQualifierArray(), right.getQualifierOffset(), right.getQualifierLength());
451
452 if (midRow == null) return right;
453
454 return CellUtil.createCell(right.getRowArray(), right.getRowOffset(), right.getRowLength(),
455 right.getFamilyArray(), right.getFamilyOffset(), right.getFamilyLength(),
456 midRow, 0, midRow.length);
457 }
458
459 return right;
460 }
461
462
463
464
465
466
467
468
469
470
471
472 private static byte [] getMinimumMidpointArray(final byte [] leftArray, final int leftOffset,
473 final int leftLength,
474 final byte [] rightArray, final int rightOffset, final int rightLength) {
475
476 int minLength = leftLength < rightLength ? leftLength : rightLength;
477 short diffIdx = 0;
478 while (diffIdx < minLength &&
479 leftArray[leftOffset + diffIdx] == rightArray[rightOffset + diffIdx]) {
480 diffIdx++;
481 }
482 byte [] minimumMidpointArray = null;
483 if (diffIdx >= minLength) {
484
485 minimumMidpointArray = new byte[diffIdx + 1];
486 System.arraycopy(rightArray, rightOffset, minimumMidpointArray, 0, diffIdx + 1);
487 } else {
488 int diffByte = leftArray[leftOffset + diffIdx];
489 if ((0xff & diffByte) < 0xff && (diffByte + 1) < (rightArray[rightOffset + diffIdx] & 0xff)) {
490 minimumMidpointArray = new byte[diffIdx + 1];
491 System.arraycopy(leftArray, leftOffset, minimumMidpointArray, 0, diffIdx);
492 minimumMidpointArray[diffIdx] = (byte) (diffByte + 1);
493 } else {
494 minimumMidpointArray = new byte[diffIdx + 1];
495 System.arraycopy(rightArray, rightOffset, minimumMidpointArray, 0, diffIdx + 1);
496 }
497 }
498 return minimumMidpointArray;
499 }
500 }